% Technical report; number and issuing institution live in their own fields.
% NOTE(review): the title spelling "intoductory" is kept as found; it is
% believed to be the report's own published spelling -- confirm before changing.
@techreport{Andrew,
  author      = {Andrew W. Moore},
  title       = {An intoductory tutorial on kd-trees},
  institution = {Computer Laboratory, University of Cambridge},
  number      = {209},
  year        = {1991}
}

% Journal article. The page range was previously stored in the number field;
% it now lives in pages, and number holds the issue.
@article{Lloyd,
  author  = {S. P. Lloyd},
  title   = {Least Squares Quantization in {PCM}},
  journal = {IEEE Transactions on Information Theory},
  volume  = {28},
  number  = {2},
  pages   = {129--137},
  year    = {1982}
}

% Workshop paper: the venue goes in booktitle, the month uses the standard macro.
@inproceedings{Alsabti,
  author    = {Khaled Alsabti and Sanjay Ranka and Vineet Singh},
  title     = {An Efficient {K}-Means Clustering Algorithm},
  booktitle = {First Workshop on High Performance Data Mining},
  month     = mar,
  year      = {1998}
}

% Journal article; author list kept on one line, month given as a macro.
@article{Kanungo2002,
  author  = {Tapas Kanungo and David M. Mount and Nathan S. Netanyahu and Christine D. Piatko and Ruth Silverman and Angela Y. Wu},
  title   = {An Efficient k-Means Clustering Algorithm: Analysis and Implementation},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume  = {24},
  number  = {7},
  pages   = {881--892},
  month   = jul,
  year    = {2002}
}

% Workshop paper: venue in booktitle, acronym protected from style recasing.
@inproceedings{Zhang,
  author    = {Yongpeng Zhang and Frank Mueller and Xiaohui Cui and Thomas Potok},
  title     = {{GPU}-Accelerated Text Mining},
  booktitle = {Workshop on Exploiting Parallelism using GPUs and other Hardware-Assisted Methods},
  month     = mar,
  year      = {2009}
}
	

% Workshop proceedings paper: venue in booktitle, acronym protected.
@inproceedings{Wu2009,
  author    = {Ren Wu and Bin Zhang and Meichun Hsu},
  title     = {Clustering Billions of Data Points Using {GPUs}},
  booktitle = {Proceedings of the combined workshops on UnConventional high performance computing workshop plus memory access workshop},
  year      = {2009}
}
	
% Conference paper: venue in booktitle, acronyms protected.
@inproceedings{Li,
  author    = {You Li and Kaiyong Zhao and Xiaowen Chu and Jiming Liu},
  title     = {Speeding up {K}-Means Algorithm by {GPUs}},
  booktitle = {IEEE International Conference on Computer and Information Technology},
  year      = {2010}
}
	
		
% Conference paper published in an LNCS volume.
% NOTE(review): the venue previously given here was the PPoPP 2008 proceedings;
% this paper is believed to have appeared at DaWaK 2008 -- confirm venue,
% volume and pages against the publisher record.
@inproceedings{Shalom2008,
  author    = {S. A. Arul Shalom and Manoranjan Dash and Minh Tue},
  title     = {Efficient {K}-Means Clustering Using Accelerated Graphics Processors},
  booktitle = {Data Warehousing and Knowledge Discovery (DaWaK 2008)},
  series    = {Lecture Notes in Computer Science},
  volume    = {5182},
  pages     = {166--175},
  publisher = {Springer},
  year      = {2008}
}
	
% Workshop paper: venue in booktitle, acronym protected.
@inproceedings{Hall2004,
  author    = {Jesse D. Hall and John C. Hart},
  title     = {{GPU} Acceleration of Iterative Clustering},
  booktitle = {ACM Workshop on General-Purpose Computing on Graphics Processors},
  year      = {2004}
}
	
	% Conference paper in an LNCS volume; series, volume and publisher split
	% out of the former combined venue string.
	@inproceedings{Cao,
	  author    = {Feng Cao and Anthony K. H. Tung and Aoying Zhou},
	  title     = {Scalable Clustering Using Graphics Processors},
	  booktitle = {Advances in Web-Age Information Management (WAIM 2006)},
	  series    = {Lecture Notes in Computer Science},
	  volume    = {4016},
	  publisher = {Springer},
	  year      = {2006}
	}
	
% Technical report: report number in number, issuing body in institution.
% A stray footnote digit was removed from the author name "Bingsheng He".
@techreport{Fang2008,
  author      = {Wenbin Fang and Ka Keung Lau and Mian Lu and Xiangye Xiao and Chi Kit Lam and Philip Yang Yang and Bingsheng He and Qiong Luo and Pedro V. Sander and Ke Yang},
  title       = {Parallel Data Mining on Graphics Processors},
  institution = {Department of Computer Science and Engineering, Hong Kong University of Science and Technology},
  number      = {HKUST-CS08-07},
  year        = {2008}
}
	
% Workshop paper: venue in booktitle. The citation key is kept unchanged for
% existing \cite commands even though the year field is 2007.
@inproceedings{Che2008,
  author    = {Shuai Che and Jiayuan Meng and Jeremy W. Sheaffer and Kevin Skadron},
  title     = {A Performance Study of General Purpose Applications on Graphics Processors},
  booktitle = {First Workshop on General Purpose Processing on Graphics Processing Units},
  year      = {2007}
}

% Conference paper. Two stray "I" tokens that had leaked into the author list
% (after "Daehyun Kim" and "Ronak Singhal") were removed so each name parses
% correctly.
@inproceedings{Debunk,
  author    = {Victor W. Lee and Changkyu Kim and Jatin Chhugani and Michael Deisher and Daehyun Kim
               and Anthony D. Nguyen and Nadathur Satish and Mikhail Smelyanskiy
               and Srinivas Chennupaty and Per Hammarlund and Ronak Singhal and Pradeep Dubey},
  title     = {Debunking the {100X} {GPU} vs. {CPU} Myth: An Evaluation of Throughput Computing on {CPU} and {GPU}},
  booktitle = {Proceedings of the 37th Annual International Symposium on Computer Architecture},
  year      = {2010}
}


% Conference paper.
% NOTE(review): the venue previously given here was an unrelated HKUST
% technical report number. The paper is believed to have appeared at
% ISCA PDCCS 2009 -- confirm venue, year and pages before relying on them.
@inproceedings{darjen2,
  author    = {Dar-Jen Chang and Mehmed Kantardzic and Ming Ouyang},
  title     = {Hierarchical Clustering with {CUDA/GPU}},
  booktitle = {Proceedings of the ISCA 22nd International Conference on Parallel and Distributed Computing and Communication Systems (PDCCS)},
  pages     = {7--12},
  year      = {2009}
}
	
% Conference paper. The title is stored in title case (not all caps) so that
% bibliography styles can recase it; proper nouns and acronyms are protected.
@inproceedings{darjen,
  author    = {Dar-Jen Chang and Nathaniel A. Jones and Dazhuo Li and Ming Ouyang and Rammohan K. Ragade},
  title     = {Compute Pairwise {Euclidean} Distances of Data Points with {GPUs}},
  booktitle = {Proceedings of the IASTED International Symposium on Computational Biology and Bioinformatics},
  year      = {2008}
}

% Conference paper: venue in booktitle (kept on one line), proper nouns and
% acronym protected, trailing period dropped from the title.
@inproceedings{darjen1,
  author    = {Dar-Jen Chang and Ahmed H. Desoky and Ming Ouyang and Eric C. Rouchka},
  title     = {Compute Pairwise {Manhattan} Distance and {Pearson} Correlation Coefficient of Data Points with {GPU}},
  booktitle = {Proceedings of the 10th ACIS International Conference on Software Engineering, Artificial Intelligence, Networking and Parallel/Distributed Computing (SNPD)},
  year      = {2009}
}
	
% Conference paper: venue in booktitle, acronyms protected.
@inproceedings{Ryoo2008,
  author    = {Shane Ryoo and Christopher I. Rodrigues and Sara S. Baghsorkhi and Sam S. Stone and David B. Kirk and Wen-mei W. Hwu},
  title     = {Optimization Principles and Application Performance Evaluation of a Multithreaded {GPU} Using {CUDA}},
  booktitle = {Proceedings of the 13th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming},
  pages     = {73--82},
  year      = {2008}
}
	
% Previously an article entry with no journal, which classic BibTeX flags as
% a missing required field.
% NOTE(review): believed to be a Sawtooth Software research paper -- confirm
% the issuing institution and series name.
@techreport{ensem2008,
  author      = {Bryan Orme and Rich Johnson},
  title       = {Improving {K}-Means Cluster Analysis: Ensemble Analysis Instead of Highest Reproducibility Replicates},
  institution = {Sawtooth Software, Inc.},
  type        = {Research Paper Series},
  year        = {2008}
}

% Journal article; the journal uses article numbers, so pages holds the
% article number.
@article{ensem2009,
  author  = {Eun-Youn Kim and Seon-Young Kim and Daniel Ashlock and Dougu Nam},
  title   = {{MULTI-K}: Accurate Classification of Microarray Subtypes Using Ensemble k-Means Clustering},
  journal = {BMC Bioinformatics},
  volume  = {10},
  pages   = {260},
  year    = {2009}
}
	 

% Vendor manual: NVIDIA OpenCL programming guide, edition 3.2, 2010.
@manual{oclprgramming,
  title        = {OpenCL Programming Guide for the CUDA Architecture},
  organization = {NVIDIA},
  edition      = {3.2},
  year         = {2010}
}

% Vendor manual: NVIDIA OpenCL best-practices guide, 2010.
@manual{oclbestpractices,
  title        = {OpenCL Best Practices Guide},
  organization = {NVIDIA},
  year         = {2010}
}
	
% Standards document: OpenCL specification, edition 1.1, 2010.
% The organization name is capitalised as a proper name.
@manual{oclspec,
  title        = {The OpenCL Specification},
  organization = {Khronos Group},
  edition      = {1.1},
  year         = {2010}
}
	
% Vendor manual: NVIDIA CUDA reference manual, edition 3.2, 2010.
@manual{cuda,
  title        = {NVIDIA CUDA Reference Manual},
  organization = {NVIDIA},
  edition      = {3.2},
  year         = {2010}
}
   